Text Data Exploration

In [1]:
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns
import requests
import json
import chart_studio.plotly as py
import plotly.express as px
import plotly.figure_factory as ff

Retrieve Text Data From Firebase

In [4]:
# Download the "test" node of the Firebase Realtime Database as JSON and load
# it into a DataFrame (top-level JSON keys become the columns).
test_url = 'https://finalproject-42236-default-rtdb.firebaseio.com/test.json'
# A timeout (seconds) keeps the cell from hanging forever if the endpoint
# is unreachable; requests has no default timeout.
response = requests.get(test_url, timeout=30)
# Fail loudly on HTTP 4xx/5xx instead of parsing an error payload as data.
response.raise_for_status()
text_test = response.json()
test_t = pd.DataFrame.from_dict(text_test, orient='columns')
In [5]:
# Download the "train" node of the Firebase Realtime Database as JSON and load
# it into a DataFrame (top-level JSON keys become the columns).
train_url = 'https://finalproject-42236-default-rtdb.firebaseio.com/train.json'
# A timeout (seconds) keeps the cell from hanging forever if the endpoint
# is unreachable; requests has no default timeout.
response = requests.get(train_url, timeout=30)
# Fail loudly on HTTP 4xx/5xx instead of parsing an error payload as data.
response.raise_for_status()
text_train = response.json()
train_t = pd.DataFrame.from_dict(text_train, orient='columns')

Interactive Data Visualization

Data Distribution

For training data

In [29]:
# One interactive histogram per column of the training frame.
for col in train_t.columns:
    # Title each figure so it can be told apart from the other columns'
    # plots and from the testing-data plots when skimming the notebook.
    fig = px.histogram(
        train_t,
        x=col,
        title=f"Training data: distribution of {col}",
    )
    fig.show()

For testing data

In [30]:
# One interactive histogram per column of the testing frame.
for col in test_t.columns:
    # Title each figure so it can be told apart from the other columns'
    # plots and from the training-data plots when skimming the notebook.
    fig = px.histogram(
        test_t,
        x=col,
        title=f"Testing data: distribution of {col}",
    )
    fig.show()

Scatter Plot

For training data

In [6]:
# Pairwise-relationship grid for the training frame, coloured by the "Group"
# column; the returned PairGrid is left as the cell's displayed value.
sns.pairplot(data=train_t, hue="Group")
Out[6]:
<seaborn.axisgrid.PairGrid at 0x1a237a3b50>

For testing data

In [39]:
# Pairwise-relationship grid for the testing frame, coloured by the "Group"
# column; the returned PairGrid is left as the cell's displayed value.
sns.pairplot(data=test_t, hue="Group")
Out[39]:
<seaborn.axisgrid.PairGrid at 0x1a27b08f10>